from xml.etree.ElementTree import ElementTree, Element


def read_xml(in_path):  
    '''''读取并解析xml文件 
       in_path: xml路径 
       return: ElementTree'''  
    tree = ElementTree()  
    tree.parse(in_path)  
    return tree  
  
def write_xml(tree, out_path):  
    '''''将xml文件写出 
       tree: xml树 
       out_path: 写出路径'''  
    tree.write(out_path, encoding="utf-8",xml_declaration=True)  
  
def if_match(node, kv_map):  
    '''''判断某个节点是否包含所有传入参数属性 
       node: 节点 
       kv_map: 属性及属性值组成的map'''  
    for key in kv_map:  
        if node.get(key) != kv_map.get(key):  
            return False  
    return True  
  
#---------------search -----  
  
def find_nodes(tree, path):  
    '''''查找某个路径匹配的所有节点 
       tree: xml树 
       path: 节点路径'''  
    return tree.findall(path)  
  
  
def get_node_by_keyvalue(nodelist, kv_map):  
    '''''根据属性及属性值定位符合的节点，返回节点 
       nodelist: 节点列表 
       kv_map: 匹配属性及属性值map'''  
    result_nodes = []  
    for node in nodelist:  
        if if_match(node, kv_map):  
            result_nodes.append(node)  
    return result_nodes  
  
#---------------change -----  
  
def change_node_properties(nodelist, kv_map, is_delete=False):  
    '''''修改/增加 /删除 节点的属性及属性值 
       nodelist: 节点列表 
       kv_map:属性及属性值map'''  
    for node in nodelist:  
        for key in kv_map:  
            if is_delete:   
                if key in node.attrib:  
                    del node.attrib[key]  
            else:  
                node.set(key, kv_map.get(key))  
              
def change_node_text(nodelist, text, is_add=False, is_delete=False):  
    '''''改变/增加/删除一个节点的文本 
       nodelist:节点列表 
       text : 更新后的文本'''  
    for node in nodelist:  
        if is_add:  
            node.text += text  
        elif is_delete:  
            node.text = ""  
        else:  
            node.text = text  
              
def create_node(tag, property_map, content):  
    '''''新造一个节点 
       tag:节点标签 
       property_map:属性及属性值map 
       content: 节点闭合标签里的文本内容 
       return 新节点'''  
    element = Element(tag, property_map)  
    element.text = content  
    return element  
          
def add_child_node(nodelist, element):  
    '''''给一个节点添加子节点 
       nodelist: 节点列表 
       element: 子节点'''  
    for node in nodelist:  
        node.append(element)  
          
def del_node_by_tagkeyvalue(nodelist, tag, kv_map):  
    '''''同过属性及属性值定位一个节点，并删除之 
       nodelist: 父节点列表 
       tag:子节点标签 
       kv_map: 属性及属性值列表'''  
    for parent_node in nodelist:  
        children = parent_node.getchildren()  
        for child in children:  
            if child.tag == tag and if_match(child, kv_map):  
                parent_node.remove(child)  
                          
  
  
# if __name__ == "__main__":  
      
#     #1. 读取xml文件  
#     tree = read_xml("./test.xml")  
      
#     #2. 属性修改  
#       #A. 找到父节点  
#     nodes = find_nodes(tree, "processers/processer")  
#       #B. 通过属性准确定位子节点  
#     result_nodes = get_node_by_keyvalue(nodes, {"name":"BProcesser"})  
#       #C. 修改节点属性  
#     change_node_properties(result_nodes, {"age": "1"})  
#       #D. 删除节点属性  
#     change_node_properties(result_nodes, {"value":""}, True)  
      
#     #3. 节点修改  
#       #A.新建节点  
#     a = create_node("person", {"age":"15","money":"200000"}, "this is the firest content")  
#       #B.插入到父节点之下  
#     add_child_node(result_nodes, a)  
      
#     #4. 删除节点  
#        #定位父节点  
#     del_parent_nodes = find_nodes(tree, "processers/services/service")  
#        #准确定位子节点并删除之  
#     target_del_node = del_node_by_tagkeyvalue(del_parent_nodes, "chain", {"sequency" : "chain1"})  
      
#     #5. 修改节点文本  
#        #定位节点  
#     text_nodes = get_node_by_keyvalue(find_nodes(tree, "processers/services/service/chain"), {"sequency":"chain3"})  
#     change_node_text(text_nodes, "new text")  
      
#     #6. 输出到结果文件  
#     write_xml(tree, "./out.xml")  
    




import  xml.etree.ElementTree as ET
  
def getXml(fileName):
    root = ET.parse(fileName).getroot() #获得根节点  
    resultList = []
    walkXml(root,resultList,'')
    return resultList  
  
def walkXml(root,resultList,tempLists):
    #if tempLists == 'root':
    #    tempLists = ""  
    tempList = tempLists+',"'+root.tag+'"'
    resultList.append(tempList)
    children_node = root.getchildren()
    if len(children_node) == 0:
        return  
    for child in children_node:
        walkXml(child,resultList,tempList)
    return  
  
# if __name__ == "__main__":  
#     file_name = "test.xml"  
#     R = getXml(file_name)  
#     for r in R:  
#         print "{"+r[1:]+"}"  


#导入lxml库
from lxml import etree
#首先根据dtd得到一个parser(注意dtd文件要放在和xml文件相同的目录)
parser=etree.XMLParser(load_dtd= True)
#用上面得到的parser将xml解析为树结构
tree = etree.parse(r"F:\chen\pythonworkspace\PythonGithub\TestFile\EMR-PL-01新增个人身份注册-F.xml",parser)
#获得该树的树根
root = tree.getroot()


#这样便可以遍历根元素的所有子元素(这里是article元素)
for article in root:
    #用.tag得到该子元素的名称
    print(元素名称：",article.tag)
    #遍历article元素的所有子元素(这里是指article的author，title，volume，year等)
    for field in article:
        #同样地，用.tag可以得到元素的名称，而.text可以得到元素的内容
        print field.tag,":",field.text
    #用.get("属性名")可以得到article元素相应属性的值
    mdate=article.get("mdate")
    key=article.get("key")
    print(mdate:", mdate)
    print("key",key)
    #隔行分开不同的article元素
    print ("")


